#!/bin/bash
#
# Launches `python3 -m verl.trainer.main` using examples/config.yaml plus the
# command-line overrides listed below. The config path is relative, so it is
# resolved against the directory the script is invoked from.
#
# Environment:
#   MODEL_PATH  Optional. Local path of the model to load. When unset or
#               empty, the default below is used.

# Trace each command as it runs so the final argument list shows up in logs.
set -x

export PYTHONUNBUFFERED=1

# Replace the default with your local file path, or export MODEL_PATH before
# running this script.
MODEL_PATH="${MODEL_PATH:-/data1/modelscope/hub/models/Qwen/Qwen3-0.6B}"

# Quoting notes:
#   * "${MODEL_PATH}" is quoted so a path containing spaces or glob characters
#     is still passed as a single argument.
#   * The logger override is single-quoted as a whole word. Unquoted, the
#     [...] part is a shell glob bracket expression and could be rewritten by
#     pathname expansion (or dropped/rejected under nullglob/failglob). The
#     text passed here is exactly what the unquoted form yields after the
#     shell strips the inner quotes.
python3 -m verl.trainer.main \
    config=examples/config.yaml \
    data.max_response_length=4096 \
    worker.actor.model.model_path="${MODEL_PATH}" \
    worker.rollout.dtype=fp16 \
    worker.actor.fsdp.torch_dtype=fp16 \
    trainer.experiment_name=qwen3_0.6b_math_grpo \
    'trainer.logger=[console,swanlab]' \
    trainer.n_gpus_per_node=2
